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Promoter DNA sequence of the extracellular invertase NIN88 from tobacco 



1 TCTAGAATGA 

51 TCGTTCAACT 

101 TCTTATCCTC 

151 GGGCCACTCC 

201 TCGTAAAGTG 

251 TATCTGACTT 

301 TG AGTG ATT A 

351 G ATCG AAACG 

401 GTAAGGGTGG 

451 TTGGTCCTTC 

501 C ATGTCC ATG 

551 CTCGCTCTTG 

601 TCTG ACCTC A 

651 TGCATAGACT 

701 AAGAGGGCAT 

751 GGGCCCTCTT 

801 TTG ATCCATT 

851 CATTTTGACG 

901 GTTGGCCCAT 

951 GTTGTGTATT 

1001 ACAGTTTTCT 

1051 GTTGCTACAA 

1101 GTTGAATCGA 

1151 TGGCAAATAT 

1201 GCCATTATGA 

1251 GGGCAGCTGT 

1301 ACATTTTCAA 

1351 TTTACCGCAG 

1401 TCATAAATTT 

1451 TGGGGCGGCT 

1501 TTTTTGGAAA 

1551 TGTTCTCTCA 

1601 CATTTTCTTC 

1651 TGTGAGTGAT 

1701 GCTGGTGCAA 

1751 TTTGTTGAGG 

1801 TCTTCACCGC 

1851 CCGCGGGATG 

1901 GGGAGAGGTG 

1951 TGATGGTGTT 

2001 TCTTCTCCCT 

2051 CTTCTCTTCT 

2101 CTAAAGTTTT 

2151 AAAAAATATA 

2201 TAAACCTAGT 

2251 TCACGGTCAT 

2301 ATTTCAAGAT 

2351 ATGGCATTAA 

2401 GGATGATTCT 

2451 TTGGGACCCT 

2501 GAATCTCTTT 

2551 CTTTTCAAAG 

2601 ATCTCTTTTT 

2651 ATACACCAAG 

2701 AACTAGCTGT 

2751 GCCCTGre AT 

2801 CTTCATGTCA 

2851 ACAAAATTGC 

2901 ACTGTTATAG 

2951 TTCTTTTCAT 

3001 AACTATAT AT 



CGCCACCGGC 

GCATTGTTAA 

GAGTTTCATT 

CATCGTCCAC 

ATAACGAGGG 

ATCGAAGATG 

ACTGTTTGAG 

TCGTCTCCGC 

r-TTCGGCGGT 

ZTCGGTCACA 

ACCTCTTGTC 

3TGGAACTCG 

rCTTTTGTGG 

ATTTCTGAGG 

ACCTCTCTCG 

CGTAGCGGGA 

TCTCGGTTAG 

ATCCTTCCTG 

TCAGGTCGTC 

rCATCCCAAG 

GGTCGCCCTC 

CCATTCCTTC 

3CGAGGAAGT 

ATCGTTCACT 

A.CTTGTCGGC 

CAATACCAAG 

CAAGATGGAG 

TGACATAATG 

TCAGATAAGG 

TCATCAeTGT 

TATTTTTGGG 

TTTGATCCCG 

AGAATGGCCG 

ACCTGTTACT 

TGCAAGTCCT 

A.TGCCGGTCA 

TGGTGGCGCC 

TTGCGATACT 

TTAGGCGTTA 

TAAGAGGTTG 

TACCTGCCAT 

TCTTTTTTGT 

AACTAGACTA 

GACTTTTGAT 

TAATGATAAT 

AGCAGCGTTG 

CATTAATGAT 

AGTAAATAAG 

TCTTTTTGAC 

TCTCGGATCT 

AGAAAGGTAG 

AATATTTTTA 

CTATTTATAT 

AATATTCAAT 

TAGCACTCGA 

TTACTAATCX5 

AATCTTAATG 

TTCCAAAGAA 

AAAGATCTGA 

ATCTAAGG AG 

CAAAGGAATG 



CAGGACGGGG 

aacx:tgttag 
tgtgcaagta 
cataatgcgt 
catcatagtg 
atactttctt 
cttgtgggtt 
ccgcgatgat 
ccctggtgtt 
caacaatatt 
ttagggcgat 
cagagggcat 
ccactttact 

GTGACACACA 
TTCCX5GTGAG 
GAGGGGCATG 
ATCATGGAGC 
GTTTCGGCTT 
TTCX5TCGGCA 
TGGTTGGAGG 
GAGCCATTCA 
TGATACATTC 
CCCTCAATCC 
CTTGCCTCCG 
CATCTCTTCG 
TCAATGCTCC 
GAGACTTGTT 
ATTACATGAT 
TGGCATCTTG 
AGGGTTGCTC 
GCACCCGGTA 
AAGCATTTTA 
TGAGGGTGTC 
GAAGGGGGAG 
TGCATTTTCT 
GCATATTTGT 
TCTTCCGTTG 
GCTGTGAGGG 
TGCCTTCGCC 
GTAGTGAGAT 
GTCAGATCTG 
GAATTGTGCC 
TCCTCACAGA 
TAAATTAATT 
AACTTCAGAT 
AGAGAAGATT 
AGGGGAATAT 
GAGAATGATT 
AATGATGAAT 
AATGAAAAAA 
TGATTGTCTT 
TCAGAGAATA 
GGGACATTCC 
AAAATATTTT 
CCTCGGTCGY 
ACCTCGATTA 
AAAGCAGATT 
AACATGGCTC 
ATTTATTTAT 
TAAAGCAACC 
GTGTTTTTTC 



AGTATGATTT 
CX3TGATGCAG 
CTCGAGGATG 
CTTACATCTG 
AGGGAAAACC 
TAAGTTTCTC 

gtggcgaact 
aatgtgaatg 
gttcacgtcc 
ttgaggtgtc 
acaatcctca 
ctgattttct 
tttggtccga 
aaatttgtga 
tccctgtcct 
atggcacttt 
tgcaagatct 
gtaccgaggt 
cgggcctcag 
atatttcata 
tgttcagccc 
ggtaaggtca 
ctctccgagt 
cgtttttagc 
aatatttctuv 
tcxtggtaagg 
ctttggagag 
cttcx3gggtc 
aacgtcttgg 
gactaaccga 
ttttatcgac 

TTTTCGTTTT 

attacctgca 
ggtcgtgctg 
ctaaatacct 
cagccaagct 
tggacgtgga 
aggggtgatc 
ttctatttcg 
tggccactgc 
ggtgtacaag 
agttatagat 
cggcgccaaa 
aatattgtat 
ctataatcaa 
aaatgtgatg 
caagcaataa 
cacccaatat 
gatgggcaaa 
gtatggaata 
ttatctagag 

TTACATCCCC 
TCAATCAATC 
TTTGAATATT 
TATTGACTAC 
CATCACTTTC 
TTGACCCATA 
TTATAGTGAA 
AAGAATAGTG 
ATGAATAGAA 
TTTAAATATG 



CCCCGAATGT 
CCCGGTACTA 
GACAATTCAC 
TATCTAATAT 
AAACCGTGGT 
GTACCGTTC.A 
TTACGTTGTT 
GTGCX3AGTCG 
TCGAGAAAAG 
CTTGATGAAG 
GTTTTGTGAC 
AGTGCTTGGA 
GCTTCTTCA-A 
GCGGATAGTA 
TGGCCTAGAT 
TGACATATGG 
CTCTTGGCAT 
CAATCGATGA 
CACAGTAGGC 
AGTTGGTTTA 
ATTCTGGAAA 
TCCTTACTCT 
GATTGTTTGA 
CCCAACATGG 
TGGAGCGCGC 
GTCTCX5CCGA. 
ATCATTGCXrC 

ggtcgtacx:a 
gtatggcata 

CCAGCGTCTC 
TCTTTCTTGG 
CCATTTCTTC 
TTATTAATAT 
TTTGGTCATT 
CCTGAGTGGG 
TCGAGTAGCT 
AGCTCCTTTA 
CACTTCGTCG 
GAGACCTCAT 
CTTCATCCTT 
GAAGTAGGAG 
CTAAAAGAAA 
TTGTTTGACC 
GACAAAGGAT 
TTAACAGCAA 

tycattcaat 
ataacgataa 
tgaatgaggt 
tactagaatg 
gtagataatc 
agaaagtctg 
CTCTCTCCxrr 
ctaaaagtac 
ctattataaa 
tcggttacga 
tacgatactg 
caAtaatatg 
atatcgttag 
tttttttctt 
aaggcttagt 
gataaaaai^^ 
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3051 TCTCAATATA 

3101 agcagaggcx? 

3151 tccggtaaag 

3201 aaaactgacc 

3251 ggaaaggaat 

3301 cx5gtcaatta 

3351 gatcggtatt 

3401 ccx5gggtctg 

3451 cattttgttt 

3501 ttttgcacga 

3551 aattacttac 

3601 cx5accaattt 

3651 gaaaaactaa 

3701 ctcaaaaata 

3751 ggtcggtttc 

3801 cgacx:aactt 

3851 gtgggtcgac 

3901 ctgtaagctt 

3951 ATCAT TAATT 

4001 CACTAGATGA 

4051 CGCCTATGAT 

4101 GAGCTCCAGA 

4151 ACTATGACTT 

4201 TTCTCCATTG 

4251 AAGAAGAAGA 

4301 ATAGGGAAAA 



GAAGATTAGA 
GACCTATGTG 
ATCGATCAAA 
AAAACGCGAT 
ACCGACCAAA 
AATTCAAAAA 
TTAATTATGT 
TACTATGGCA 
TAAGACTGTC 
AAA.TAACCGA 
CAAAGTTGGT 
TGGTAGGTTT 
CCAAAGTTAG 
GTTTCCCGCA 
GTAAAAAAAA 
TAGTCGGTTT 
CTTGGTCGGT 
CGGGAGAAM. 



TCAATTAACA 
TTATAGTAAG 
AAACXrGACCA 
CATTTACGTG 
GTTGGTCGGA 
7AATATTGTA 
AATAAAAAGA 
AGATACTATT 
TTTTATTTGA 
CCAAAGTTGG 
CGATTTTTTT 
TTTTAATATf 
TCGGTTTCTT 
TTTTTGCGCX: 
AAAAAATTTA 
TTTGGTCGAT 
TTTTGCCGAA 
TTTGTATATG 



AAGGTTATGG 
GGGTCACCCA 
ACATTGGTCG 
TGAACX5GTAT 
AATTACCGAC 
AAAAAAAACC 
TTCACTATCT 
CTACCACTAG 
TTTATACTCT 
TCGATTTTAT 
AAATGATCCX5 
AATTTTTATT 
GAAACATAAA 
AAAGAAAACC 
AAAAATATAT 
TTTTTGACCG 
TT TCTAGTAG 
TATAT GTGTA 



TG GAGTGGTA 
CTACTAGAAA 
GTAATGGCCA 
TTTTATGGTC 
CAACTTTGGT 
GACCAAAGTT 
GGGAATCGAA 
ACCATTGGTT 
TTAATTATAT 
TAAAAAGTAA 
CXTGAATTAAC 
TATTTTAATT 
TTTCGCGGGA 
GACCAAAGTT 
TTTAAAAAAC 
ACCAAAGTTG 
TGACCGAACC 



TAAAGAACGT 
GCAGAATT^C 
GGTAAGTACT 
TATAAACTAT 
CATCTGATTT 
TTCAGTTTCT 
AGAAGAAGAA 



GGCACCCTGA 
GTGTTCTCGT 
TCTTCGTCCT 
AGACTCGTCT 
CTCTATAftAT 
TTCTCCACAT 
AAATAAAGAG 



ATACTAGAAG 
CGCGTAAAAA 
TAATCAGAGG 
TTATAGCACC 
ACTCCTCAAG 
CACAGAAGTG 
TTTCTGTCAA 



TATCCTTAAA 
CCTTTAGGGG 
TACTTGGATC 
TTTCGACTTC 
TTTTAATAAG 
CTTTCGGTTC 
AAAACAAAAC 
ATTAAGTCCA 
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Expression of NIN88-promotor 
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Germination rate (% of viable pollen) 
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Starch accumulation (% of pollen with positive starch staining) 
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Fig. 12 
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Fig. 13A 



Fig. 13B 
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Genomic sequence of NINSS 

1 ATGGAGCTGT TTAGAAAAAG CTCTTTTCAT TGTGCTTTGC CAGTTTTCAT 
51 ATTATTGGTT TGCTTGTTTA TAATTTTATC TAACTATGTT GTGTTTGCTT 
101 TCAATTATGA CGTTTTTACG TGCTTCCAAT CCTCAAAAGA TGCTAATATC 
151 ACTTCTAACT ACAGAACTGG TTACCATTTT CAACCCCCCA AGAACTGTAT 
201 GAATGGTACG TTTCTCTCCC CTTCCACCCA CCCCACCCCC TCTTCTGTTG 
251 TTGCTTTTGA TATGTGTATA TATATATATA TATCCATTTT TTGCTCGGTA 
301 TCGGCATTAG GATCCACTAA ATTCGGCATT GAGGGGTAAT TAGGCGTCTA 
351 ACAAAGTCAA TTCCATAACT AGGGCTCGAA CCCGAGACTT CCGATTAAAA 
401 ATGAAGGAGT ACTTAACACT TATTCTGTAA CATTAAACAA TAGACATCCT 
451 ACTCCTCTAA ACTCATTTGT ATTTTTAAAA TATCTATTTT ACCCTCGATC 
501 TTATTAGCCT TCATCTACTT tTTTTTTTTT TACTTTTTTA ATATCACAAT 

551 ATTTTCTTAT TCTATGTTAT GAATTTACCT ATAGTGAACA TAAAATTTAA 

601 AAAAGGTGAA AAACAATAAT CAATCATATA CTTATTGAAG TTAGAATAAT 

651 GAAACAAATG GGCGCAATTA AAATATTAGA ATAACAGATC TTATTAATAT 

701 CAATCAAATA AAATTTAGTT CAGTAATATA AAAAAATAAT TAAACATAGA 

751 GGTAGATTTT CTAAGAAATT CCTAAAAGAT TATATATTTA TAACTTAGAA 

801 AATATTTTGT TAATGAAAAT AAATATTCAA AGATATATAC AGAACAACAA 

851 CAACAACCCG ACCTTACCCC TACCCTGGGG TAGAGAGACT GTTTCCGATA 

901 GACCCTCGGC TCCCTCCCTC CAAGAACTCC CCACCTTGCC CTTGGGATGA 

951 CTCGAACTCA CAACCTCTTA GTTGGAAGTG GATGGTGCTT ACCACTAGAG 

1001 CAACCCGCTC TTGTCCGAAG ATATATACAG AAACATGTAA TAAAGAATAA 

1051 .AAGAGAAAGT AAAACTTAAA TATATAGATA ATATTAATGT AACGATAAAA 

1101 AAGAGTAACG ATAATTGTTT TTGCAAATTC ATAAAGGTAT TATTCTAGTT 

1151 AAATTTTATT GAGTTTTAAT TATATAATTT ATCATAAGAT ATTAAAATTG 

1201 GTAAAATACT TAGGCTAATG ATAAAATACA TCTTATATAA TATTAAAAAA 

12 51 AATAGAGGAG AAATTGAAAA TGTCAAGGGT AAAATAGAAA ATGCATATGA 

1301 TAGGAGGAGC GAAATATATA TTATTTAGTG TTGGAAGAGT GATTTGATTT 

1351 TTAAGATAAA ATTAGGGGAT GAAAATGATT TTTACACTTT AATAGATAGA 

1401 TCCTACTGAA ACACGTGTGA GTTCCAAAAG CAAAAAACGA AAAAGGAACC 

1451 AGCTCCCTAA TAATGAGTAC TTATTATACA AGTAAATACA ATTAGAGGAC 

1501 ACTAATTGCA ACCCCCTACT TGGGAACTGT CGGCCTATTG CTTTAATTAC 

1551 TTATACTCTC ACTCCGTTCA CTTTTACTTA TCCAATATTC TAAGTGACAT 

1601 TTGGACATAA GAATTGTAAA ATTCCAAAAT AGGAAAAAAA AATACAAGTG 

16 51 AAAATGTTAT TTGAAATTTA GAGTTACGTT TGGACATGAA TATAATTTTG 

17 01 GGTTGTTTTT AAAGTTTTGT GAGTGATTTG AGTGAAAATT TTGAAAAACA 
17 51 GTTTTTTGAA GTTTTTCAAA TTTTCGAAAA TTTTCAAAAT GCATCTTCAA 
1801 ATGAAAATTG AAAATTTTAT GAACAAACGC TGATTTCGAA AAAAA.^GTGA 
1851 TTTTTTTGTG GAAAAAAGAA AAAAATTTCT TATGTCCAAA CGGGCTCTAA 
1901 fiJ^^rAGATTT TCACTTTTAC TTGTCACTTT TCGCATATCA AGAGAAGACA 
1951 ATTTCTTTTT TTCTGTTATA CTCATAGTAT TAATTACTCA TTTCAAATCA 
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Fig. 15B 



2001 


TTTTTTCAAA 


TCCACTAAAA 


ATATGTATCA 


ATTAATATGG 


GTATTATGGT 


2051 


AAATTATGCA 


CTTCATTTAT 


TATTTCTTAA 


GGAGTGTTCA 


AAGTCCGTAG 


2101 


TAGACAAGTA 


AAAGTGAATG 


GAGAGAGTAA 


TAAATTACAC 


CTACTTTCTT 


2151 


GGAAATACCA 


GTTGAGACAT 


ACGTAGAACT 


TTTGCTAATT 


TTTTCTTATT 


2201 


TTTTCTTAAT 


TATATTATAT 


TTGTGTGTGA 


TATGGGCAGA 


AGGGGTTGGT 


2251 


AAGAAGGATC 


TTGTCCCCAT 


CAGCAACTTA 


CAATATTTTA 


GGGAAGACAA 


2301 


ATAATAATTT 


TCTGCATTTC 


CTAAATTTTT 


GTAATTTCAC 


TTTTCATTTG 


2351 


TTTATTATTT 


GATTATTCAT 


CAATATTAAA 


TTATGCAGAT 


TTAGTACTCA 


2401 


CATTCAATTG 


TTTATTTACA 


ATTTTTTTTA 


ATTTTTTTCT 


TTATGGTCTT 


2451 


TC.TCGATGCC 


TTCAAACATA 


CAAATAGACC 


CCAATGGTGA 


GTCAGAAATT 


2501 


TTATCTTCTT 


TTTATATATA 


TAATTTAATC 


ACCAATTATT 


CATTTATGAT 


2551 


ACTGATTTTT 


CATGTAATTA 


CCAACAGCAC 


CAATGTATTA 


CAATGGAGTC 


2601 


TATCATCTAT 


TCTACCAGTA 


CAATCCAAAA 


GGATCAACAA 


TGAACAACAT 


2651 


TGTTTGGGCT 


CATTCAGTCT 


CAAAAGACTT 


AATCAATTGG 


ATTAATTTAG 


2701 


AGCCTGCAAT 


TTATCCATCC 


AAACCATTTG 


ACAAATATGG 


AACATGGTCT 


2751 


GGTTCAGCAA 


CTATTCTCCC 


TGGTAACAAG 


CCCATTATTT 


TGTACACTGG 


2801 


AGTGGTAGAT 


GCCAACATGA 


CCCAAGTCCA 


AAATTACGCC 


GTCCCGGCCA 


2851 


ACTTATCCGA 


TCCATATCTC 


CGTGAATGGA 


ACAAGCCCGA 


TAACAACCCG 


2901 


TTGATCGTCC 


CGGATATCAG 


CATCACCAAG 


ACCCAATTTC 


GTGACCCGAC 


2951 


AACAGCTTGG 


ATGGGCAAAG 


ATGGTCATTG 


GAGAATTGTG 


GTAGGAAGTT 


3001 


CAAGAAACCG 


TGGTGGGTTG 


GCAATATTGT 


ATAGAAGTAG 


GAATTTCATG 


3051 


AAATGGATCA 


AGGCTGAGCA 


TCCACTTCAT 


TCATCTGCCA 


AAACAGGAAA 


3101 


TTGGGAATGC 


CCAGATTTTT 


TTCCTGTTTC 


CTTGCAAGGT 


TCTAATGGTT 


3151 


TAGATGCATC 


GTACAACGGA 


AAATATGTTA 


AGTACGTTCT 


CAAGAATAGC 


3201 


CTTCCTGTTG 


CCGCGTTTGA 


GTACTACACA 


ATTGGTACAT 


ATGATGCCAA 


3251 


ACAAGATAGG 


TATATTCCAG 


ATAACACTTC 


AGTCGATGGT 


TGGAAAGGAT 


3301 


TGAGACTTGA 


CTATGGCATT 


TTCTACGCGT 


CTAAGTCGTT 


CTACGACCCT 


3351 


AGTAAGGACC 


GAAGAATCGT 


GTGGGGTTGG 


TCTTATGJ\AT 


TAGATGGTCT 


3401 


CCCCAATAAT 


GAAAACAACA 


AAGGATGGGC 


CTGGAATTCA 


GGCTATCCCG 


3451 


CGTAAAGTAT 


GGCTTGATTT 


CAGTGGTAAA 


CAATTAGTTC 


AATGGCCTAT 


3501 


TGAAGAATTA 


AAAACTCTAA 


GAAAGCAAAA 


TGTCCGATTG 


AGCAACAAAA 


3551 


GGCTGGATAA 


TGGAGAAAAG 


ATTGAAGTTA 


AAGGAATCAC 


AGCGTCGCAG 


3601 


GTTTAGACTT 


TTTTCTAGTT 


TTTAATTTGC 


AAGCATTTTA 


AATAAAATTT 


3651 


TCTTCACAAG 


TTAAGGCTAA 


GTTGGGACAT 


CTATTGAAAT 


TGCCAGGCTG 


3701 


ATGTTGAAGT 


GACATTCTCC 


TTCTCTAGCT 


TAGACAAGGC 


AGAGCCATTT 


3751 


GATCCTAGTT 


GGGCTGATCT 


TTATGCACAA 


GATGTTTGTG 


CAATTAAGGG 


3801 


TTCAACTGTT 


CCAGGTGGGC 


TTGGGCCATT 


TGGCCTTGCA 


ACATTGGCTT 


3851 


CTCAAAACTT 


AGAAGAATAC 


ACACCTGTTT 


TTTTCAGAGT 


GTTCAAAGCT 


3901 


CAGAATTT 
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Sequence of NIN88 promoter fused with NIN88 antisense 



1 


TCGAGCCATT 


CATGTTCAGC 


CCATTCTGGA 


AAGTTGCTAC 


AACCATTCCT 


51 


TCTGATACAT 


TCGGTAAGGT 


CATCCTTACT 


CTGTTGAATC 


GAGCGAGGAA 


101 


GTCCCTCAAT 


CCCTCTCCGA 


GTGATTGTTT 


GATGGCAAAT 


ATATCGTTCA 


151 


CTCTTGCCTC 


CGCGTTTTTA 


GCCCCAACAT 


GGGCCATTAT 


GAACTTGTCG 


201 


GCCATCTCTT 


CGAATATTTC 


AATGGAGCGC 


GCGGGCAGCT 


GTGAATACCA 


251 


AGTCAATGCT 


CCTCCGGTAA 


GGGTCTCGCC 


GAACATTTTC 


AACAAGATGG 


301 


AGGAGACTTG 


TTCTTTGGAG 


AGATCATTGC 


CCTTTACCGC 


AGTGACATAA 


351 


TGATTACATG 


ATCTTCGGGG 


TCGGTCGTAC 


CATCATAAAT 


TTTCAGATAA 


401 


GGTGGCATCT 


TGAACGTCTT 


GGGTATGGCA 


TATGGGGCGG 


CTTCATCACT 


451 


GTAGGGTTGC 


TCGACTAACC 


GACCAGCGTC 


TCTTTTTGGA 


AATATTTTTG 


501 


GGGCACCCGG 


TATTTTATCG 


ACTCTTTCTT 


GGTGTTCTCT 


CATTTGATCC 


551 


CGAAGCATTT 


TATTTTCGTT 


TTCCATTTCT 


TCCATTTTCT 


TCAGAATGGC 


601 


CGTGAGGGTG 


TCATTACCTG 


CATTATTAAT 


ATTGTGAGTG 


ATACCTGTTA 


651 


CTGAAGGGGG 


AGGGTCGTGC 


TGTTTGGTCA 


TTGCTGGTGC 


AATGCAAGTC 


701 


CTTGCATTTT 


CTCTAAATAC 


CTCCTGAGTG 


GGTTTGTTGA 


GGATGCCGGT 


751 


CAGCATATTT 


GTCAGCCAAG 


CTTCGAGTAG 


CTTCTTCACC 


GCTGGTGGCG 


801 


CCTCTTCCGT 


TGTGGACGTG 


GAAGCTCCTT 


TACCGCGGGA 


TGTTGCGATA 


851 


CTGCTGTGAG 


GGAGGGGTGA 


TCCACTTCGT 


CGGGGAGAGG 


TGTTAGGCGT 


y U 1 


TATGCCTTCG 


CCTTCTATTT 


CGGAGACCTC 


ATTGATGGTG 


TTTAAGAGGT 


y D 1 




ATTGGCCACT 


GCCTTCATCC 


TTTCTTCTCC 


CTTACCTGCC 


1 n n 1 


A i (j 1 C ACjj ATC 


TGGGTGTACA 


TV TV TW /~^m TV 

AGGAAGTAGG 


AGCTTCTCTT 


CTTCTTTTTT 


lU D ± 


VjUjAAI 1(j1Xj 


t^t^ A /^rnrri a in a 

C C AGTT AT AG 


TV my^/n TV TV TV Ti ^ 

ATCTAAAAGA 


AACTAAAGTT 


TTAACTAGAC 


1 1 m 




GACGGCGCCA 


A A 1 i U 1 1 11 Hi 1 1^*1 IV 

AATTGTTTGA 


CCAAAAAATA 


TAGACTTTTG 


i i D 1 


A rrifTi AAA rrUTl A A 

ATTAAATTAA 


TTAATATTGT 


ATGACAAAGG 


ATTAAACCTA 


GTTAATGATA 


iz U i 


ATAACTTCAG 


ATCTATAATC 


AATTAACAGC 


AATCACGGTC 


ATAGCAGCGT 


1 O C 1 

jiZ b 1 


fTU^ A A A A A 

TGAGAGAAGA 


fnm TV TV TV my^iTij'^ t^, 

TTAAATGTGA 


TGTnCATTCA 


ATATTTCAAG 


ATCATTAATG 


1 J Ul 


A rn A /^^^^^/^ A A fT* 

ATAGGGGAAT 


A m/^ A A /^/^ A m 

ATCAAGCAAT 


TV TV ^ m Th Ik ^ m 

AAATAACGAT 


AAATGGCATT 


AAAGTAAATA 


1 J D 1 


AGGAGAATGA 


TTCACCCAAT 


ATTGAATGAG 


GTGGATGATT 


CTTCTTTTTG 


1401 


AC AATG ATG A 


ATGATGGnCA 


AATACTAGAA 


TGTTGGGACC 


CTTCTCGGAT 


14 51 


CTAATGAAAA 


AAGTATGGAA 


TAGTAGATAA 


TCGAATCTCT 


TTAGAAAGGT 


1501 


AGTGATTGTC 


TTTTATCTAG 


AGAGAAAGTC 


TGCTTTTCAA 


AGAATATTTT 


1551 


TATCAGAGAA 


TATTACATCC 


CCCTCTCTCC 


CTATnTCTTT 


TTCTATTTAT 


1601 


ATGGGACATT 


CCTCAATCAA 


TCCTAAAAGT 


ACATACACCA 


AGAATATTCA 


1651 


ATAAAATATT 


TTTTTGAATA 


TTCTATTATA 


AAAACTAGCT 


GTTAGCACTC 


1701 


GACCTCGGTC 


GnTATTGACT 


ACTCGGTTAC 


GAGCCCTGTC 


ATTTACTAAT 


1751 


CGACCTCGAT 


TACATCACTT 


TCTACGATAC 


TGCTTCATGT 


CAAATCTTAA 


1801 


TGAAAGCAGA 


TTTTGACCCA 


TACAATAATA 


TGACAAAATT 


GCTTCCAAAG 


1851 


AAAACATGGC 


TCTTATAGTG 


AAATATCGTT 


AGACTGTTAT 


AGAAAGATCT 


1901 


GAATTTATTT 


ATAAGAATAG 


TGTTTTTTTC 


TTTT CT TTTG 


ATATCTAAGG 


1951 


AGTAAAGCAA 


CCATGAATAG 


AAAAGGCTTA 


GTAACTATAT 


ATC.AAAGGAA 


2001 


TGGTGTTTTT 


TCTTTAAATA 


TGGATAAAAA 


TTTGTGAATA 


TAGAAGATTA 


2051 


GATCAATTAA 


CAAAGGTTAT 


GGTGGAGTGG 


TAAGCAGAGG 


CGGACCTATG 
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2101 TGTT ATAGTA 

2151 AAAAACCGAC 

2201 ATCATTTACG 

2251 AAGTTGGTCG 

2301 AAAAATATTG 

23 51 GTAATAAAAA 

2401 CAAGATACTA 

2451 TCTTTTATTT 

2 501 GACC AAAGTT 

2 551 GTCGATTTTT 
2601 TTTTTTAATA 
2651 AGTCGGTTTC 
2701 CATTTTTGCG 
2751 AAAAAAAATT 
2801 TTTTTGGTCG 
2851 GTTTTTGCCG 
2901 ATTTTGTATA 
2951 GnnGCACCCT 
3001 ACGTGTTCTC 
3051 CTTCTTCGTC 
3101 ATAG ACTCGT 
3151 TTCTCTATAA 
3201 CTTTCTCCAC 
3251 AAAAATAAAG 
3301 TTTGGATCCC 
3351 ACCCCACACG 
3401 CGTAGAAAAT 
3451 GTGTTATCTG 

3 501 GTAGTACTC A 
3551 C ATATTTTCC 
3601 ACAGGAAAAA 
3651 AAGTGGATGC 
3701 ATATTGCCAA 
3 751 TGACCATCTT 
3801 GGTGATGCTG 
3851 ATTCACGGAG 
3901 ACTTGGGTCA 
3 951 GTTACCAGGG 
4001 ATGGTTTGGA 
4051 TCTTTTGAG A 
4101 TGG ATTGTAC 



AGGGGTCACC 

CAACATTGGT 

TGTGAACGGT 

GAAATTACCG 

TAAAAAAAAA 

GATTCACTAT 

TTCTACCACT 

GATTTATACT 

GGTCGATTTT 

TTAAATGATC 

TTAATTTTTA 

TTGAAACATA 

CCAAAGAAAA 

TAAAAAATAT 

ATTTTTTGAC 

AATTTCTAGT 

TGTATATGTG 

GAATACTAGA 

GTCGCGTAAA 

CTTAATCAGA 

CTTTATAGCA 

ATACTCCTCA 

ATCACAGAAG 

AGTTTCTGTC 

CGTTTTCATT 

ATTCTTCGGT 

GCCATAGTCA 

GAATATACCT 

AACGCGGCAA 

GTTGTACGAT 

AATCTGGGCA 

TCAGCCTTGA 

CCCACCACGG 

TGCCCATCCA 

ATATCCGGGA 

ATATGGATCG 

TGTTGGCATC 

AGAATAGTTG 

TGGATAAATT 

CTGAATGAGC 

TGGTAGAATA 



CACTACTAGA 
CGGTAATGGC 
ATTTTTATGG 
ACCAACTTTG 
CCGACCAAAG 
CTGGGAATCG 
AGACCATTGG 
CTTTAATTAT 
ATTAAAAAGT 
CGCCGAATTA 
TTTATTTTAA 
AATTTCGCGG 
CCGACCAAAG 
ATTTTAAAAA 
CGACCAAAGT 
AGTGACCGAA 
TATATCCTTA 
AGCCTTTAGG 
AATACTTGGA 
GGTTTCGACT 
CCTTTTAATA 
AGCTTTCGGT 
TGAAAACAAA 
AAATTAAGTC 
ATTGGGGAGA 
CCTTACTAGG 
AGTCTCAATC 
ATCTTGTTTG 
CAGGAAGGCT 
GCATCTAAAC 
TTCCCAATTT 
TCCATTTCAT 
TTTCTTGAAC 
AGCTGTTGTC 
CGATCAACGG 
GATAAGTTGG 
TACCACTCCA 
CTGAACCAGA 
GCAGGCTCTA 
CCAAACAATG 
GATGATAGAC 



AATCCGGTAA 
CAAAAACTGA 
TCGGAAAGGA 
GTCGGTCAAT 
TTGATCGGTA 
AACCGGGGTC 
TTCATTTTGT 
ATTTTTGCAC 
AAAATTACTT 
ACCGACCAAT 
TTGAAAAACT 
GACTCAAAAA 
TTGGTCGGTT 
ACCGACCAAC 
TGGTCGGTCG 
CCCTGTAAGC 
AAATGATTAA 
GGCACTAGAT 
TCCGCCTATG 
TCGAGCTCCA 
AGACTATGAC 
TCTTCTCCAT 
ACAAGAAGAA 
CAATAGGGAA 
CCATCTAATT 
GTCGTAGAAC 
CTTTCCAACC 
GCATCATATG 
ATTCTTGAGA 
CATTAGAACC 
CCTGTTTTGG 
GAAATTCCTA 
TTCCTACCAC 
GGGTCACGAA 
GTTGTTATCG 
CCGGGACGGC 
GTGTACAAAA 
CCATGTTCCA 
AATTAATCCA 
TTGTTCATTG 
TCGAG 



AGATCGATCA 

CCAAAACGCG 

ATACCGACCA 

TAAATTCAAA 

TTTTAATTAT 

TGTACTATGG 

TTTAAGACTG 

GAAAATAACC 

ACCAAAGTTG 

TTTGGTAGGT 

AACCAAAGTT 

TAGTTTCCCG 

TCGTAAAAAA 

TTTAGTCGGT 

ACCTTGGTCG 

TTCGGGAGAA 

TTTAAAGAAC 

GAGCAGAATA 

ATGGTAAGTA 

GATATAAACT 

TTCATCTGAT 

TGTTCAGTTT 

GAAGAAGAAG 

AATGGAGCTG 

CATAAGACCA 

GACTTAGACG 

ATCGACTGAA 

TACCAATTGT 

ACGTACTTAA 

TTGCAAGGAA 

CAGATGAATG 

CTTCTATACA 

AATTCTCCAA 

ATTGGGTCTT 

GGCTTGTTCC 

GTAATTTTGG 

TAATGGGCTT 

TATTTGTCAA 

ATTGATTAAG 

TTGATCCTTT 
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Fig. 17A 

1 CATAATCAAA TGTGTGGTCT TATGTAGAAC TAATATTTGG TAATATTAGG 

51 CAAGTTGTTA TGTGACTTAT TTTATTCAAA AATATAATAA GAAGTTCAAA 

101 GAGAAGAGTA CAAGTAAGTA AGTAAGCAGA GACGAATCCT GGATTTAAAG 

151 GGTCTGGCTA TATTAATGTT TTTTTAATTT AAGCATTAGC GATTCGCCTT 

201 GCAAGTAATC GATAGGACAA AAGTTTTACC TTACTAATTC TATTGAGGCA 

251 CGAAATCCCT AT GAAAAAGC ATGTAAAATA TG AGAAGACG AAAGAATTAA 

301 ATAGGTTATA ATTATTGTAT AATTTATAAC ACACTTTATG ATAATATTAC 

351 AAATAAGAAT ATCGAATATT TAATTAATGA CGAACTATAA AAGCAAAGAA 

401 GGAAGGATGA GCTTCCAAAA ACAATCGCAA ATGAATAAAG ATGCCCAAAA 

4 51 TAGAGTAACC TAACGAAGTC GATACTTCCA TTCATAATCA AATCTGTTCA 

501 AAAACACTTG ATGGGTTATT TTTAACTTTA AGAGATGTAT CATATCGTCT 

551 CTTATTATTC CTTTAGGGCT ATTCGCCGTA GGAATAAAAT TTATATGATC 

601 AAATTTCACG TTATAT AAAT AATGTGA AGA AAAAACTTAT ACTTTTCAAG 

651 GTAACAAGAA ATCATGTTTT TTTTACGCCT TCGTGGAGAC TACTTCCTCG 

701 TAACAAAAAA TTAACATTTT AAGTGGCGAC TCTAAAAACT CGTGGCCAGT 

7 51 ATATTAGTCG CCATTAAACA TTATTTTTAA TCATGAGTTC TTTTCTTTTT 

801 TAATCTTTTT TTAAGGTCAA ATTTACCACT TTATCTTATT TATTTAAATT 

851 GAAAAATCCC AAATTTTGCA TTATTTTTTT GAATTCCTTT TTTTTTTACA 

901 CACTCAAAAA GTCAAAA CAT TAAAAAAACG AAATAGCAAA TTAAATGGCA 

951 AAAGACTTGT TGTAACAAAA AAAAAATAGT AAAACAGACT CATAAAAGGT 

1001 AACAATAACC AACAAATCAC ACAAAATTGT AGATAAATAT TATGCAAACA 

1051 AATAAAAATT AATAATCCAA TCCATTTATT TATTTTTTTA AAAAAAACCT 

1101 AAATTAACTC TCCATCTTTC AATCAAAAAC AAACTCTACC CATTTTTTTC 

1151 ACTATAAATA CTCTTCATAA TTTTCATTTG TTCTTCATTC CCATGTTTCT 

1201 TTTCTCCTTA TCC AAAAAAA AAAAAATTAA AAAAAA TTAT TTAGATTAAA 

12 51 TATCACTATC TGTCAAAGCC CAATCATT/^JX AATAAAATAA AAATTATGGA 

1301 TTATTCATCT . AATAAAAGTT CTCGTTGGGC TTTGCCAGTT ATCTTAGTTT 

1351 GCTTTTTTGT AATTTTATTA TCCAATAATG TTGTTTTTGC TTCTCATAAA 
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Fig. 17B 



1401 GTTTTTATTC ACTTGCAATC TCA7UVATGCC GTAAATGTTC ATACTGTTCA 

1451 TCGAACTGGT TATCATTTTC AGCCCGAAAA ACATTGGATC AATGGTATGT 

1501 TTATTCCTTT TTTTCGTCTT TTTTTTATAT ATATATATAT AATAAAACGA 

1551 ACATGTTGTG TTTAGTCTAG ATTTAATACT AGTGATTTTT TTGACGCTAA 

1601 CA/UVTAATCG AGTACTCACC ATTTGTCAAT AGATACATTG ACATGTATTA 

1651 GTATGATTTT CGTCTTTTTT CGTTGTTTCT AATATTATTT AATCTTCACT 

1701 AATTTTTTTA TTTTTCTTTG AATGATGTCT CTTGGTCAAA ACATACAATA 

1751 GATCCCAATG GTAAGTTAAC TATATTTTTG TATATTTTTT AAATTTATTT 

1801 TATTCTTATT ATATAATATA GGGAAAAAAG GATAAATATA TCCCCGAACT 

1851 ATTATAAATA GTATGCACCA GTATCCTCTG TTATACTTTA GAGATATTTT 

1901 TGCCGTCAAA AAACTAGAAC ACATATATCC TTTATTTATC CCGATATCGA 

1951 ATCGATTGTA CCACGAGTGA AGGGTATAGC TCTAGTTTTG GACGGTAGGG 

2001 CACCTAAAGT AGACGAAGA 
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